#!/usr/bin/env bash

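# Train and test STAViS audiovisual models for all splits.
# NOTE: every `python main.py` invocation in this section is commented out, so
# running the script as-is launches nothing here. To run a configuration,
# uncomment its whole block, including the `split=N` line above it, because the
# command arguments expand ${split}.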

# Directory passed to main.py via --root_path in the (commented-out) runs below.
base_path="./experiments"

# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --explain "multi fusion wo spatio_att and transposeConv" \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --explain "multi fusion wo spatio_att and transposeConv" \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --explain "multi fusion wo spatio_att and transposeConv" \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_multiScale \
#     --explain "multi fusion wo spatio_att, transposeConv and dsam_multiScale" \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --explain "multi fusion bilinear upsamp" \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "nearest" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --explain "multiFusion ks=3 nearest upsample" \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --explain "multiFusion ks=3 bilinear upsample" \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear upsamp" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_multiScale \
#     --explain "multi fusion bilinear upsamp wo dsam_multiScale" \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=2
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear upsamp" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --no_use_dsam_multiScale \
#     --explain "multi fusion bilinear upsamp wo dsam_multiScale" \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear upsamp" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_scheduler \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1,2,3 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_multiScale \
#     --no_scheduler \
#     --explain "multi fusion bilinear upsamp wo dsam_multiScale" \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# --resume_path "./experiments/202011192150/save_40.pth" \
# --pool_layer "tempAvg" \
# --no_scheduler \
# --learning_rate 0.01 \
# --temp_reduction 2 \
# --attn_dropout 0.1 \
# --num_heads 5 \

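# Experiment directory names under ./experiments:
# 202011192332  (the run whose save_40.pth is passed to --resume_path below)
# 202011200103  (presumably another run directory; not referenced in this section, confirm)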
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --no_train \
#     --no_val \
#     --resume_path ./experiments/202011192332/save_40.pth \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --attn_dropout 0.1 \
#     --num_heads 5 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear tempAvg" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --attn_dropout 0.1 \
#     --num_heads 5 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear tempAvg" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --attn_dropout 0.1 \
#     --num_heads 5 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear tempAvg" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#

# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --learning_rate 0.000001 \
#     --lr_transformer 0.000001 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_test \
#     --no_scheduler \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011232222/save_40.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --learning_rate 0.0001 \
#     --lr_transformer 0.0001 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion bilinear audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_multiScale \
#     --no_test \
#     --audiovisual True --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/visual_multi_train_test/split${split}_results/save_40.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion baseline" \
#     --no_test \
#     --no_scheduler \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_scheduler \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 4 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=4" \
#     --no_test \
#     --no_scheduler \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011282009/save_20.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_scheduler \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_scheduler \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011290108/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011290126/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_final_test/split1_results \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --no_train \
#     --no_val \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011290038/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_final_test/split2_results \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --no_train \
#     --no_val \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011291110/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_final_test/split3_results \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --no_train \
#     --no_val \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2 audiovisual" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 10 --n_epochs 20 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011291139/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_test \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 10 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011292116/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011292209/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt
#
#
# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./experiments/202011292302/save_best.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt


# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_only_test/split1_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011292116/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_only_test/split2_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011292209/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt


# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_only_test/split3_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011292302/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_multi_test2/split1_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011300004/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_multi_test2/split2_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011300111/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt


# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./audiovisual_multi_test2/split3_results \
#     --no_train \
#     --no_val \
#     --dataset split${split} \
#     --pool_layer "tempAvg" \
#     --use_transformer \
#     --num_heads 8 \
#     --attn_dropout 0.1 \
#     --lr_transformer 0.001 \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "multi fusion tempAvg temp_reduction=2" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --no_use_dsam_att \
#     --no_use_dsam_multiScale \
#     --audiovisual True --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --resume_path ./experiments/202011300217/save_best.pth \
#     --audio_pretrain_path "" \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
# --eval_path experiments/audiovisual_multi_test2

# Run main.py once per split with the transformer-based audiovisual
# configuration, then score everything written under audiovisual_multi_test3
# with eval_multiprocess.py.
#
# The three runs share every option except the split number and the checkpoint
# handed to --pretrain_path, so they are driven from a single loop instead of
# three hand-maintained copies. Option order is irrelevant to the command line
# as long as each flag keeps its value (assumes main.py uses an order-agnostic
# parser such as argparse -- TODO confirm).
#
# Reads:  base_path (defined at the top of this file).
# Writes: split (left at the last split number, as before), pretrain_ckpts,
#         result_dir, fold_lists, failed_splits, train_args.
# Exits:  1 without running the evaluation if any split's main.py run failed.

# Checkpoint passed as --pretrain_path, indexed by split number.
# NOTE(review): these look like the visual-only models trained earlier --
# confirm before changing.
pretrain_ckpts=(
  [1]=./experiments/202011292116/save_best.pth
  [2]=./experiments/202011292209/save_best.pth
  [3]=./experiments/202011292302/save_best.pth
)
result_dir=./audiovisual_multi_test3
fold_lists=./data/fold_lists
failed_splits=()

# "${!pretrain_ckpts[@]}" expands to the array indices in ascending order: 1 2 3.
for split in "${!pretrain_ckpts[@]}"; do
  # Build the argument list as an array so every expansion stays one word
  # even if a path ever contains whitespace or glob characters.
  train_args=(
    --gpu_devices 0,1 --batch_size 128 --n_threads 12
    --result_path "${result_dir}/split${split}_results"
    --dataset "split${split}"
    --pool_layer "tempAvg"
    --use_transformer
    --num_heads 8
    --attn_dropout 0.1
    --lr_transformer 0.001
    --learning_rate 0.01
    --temp_reduction 2
    --upsample_func "bilinear"
    --explain "multi fusion tempAvg temp_reduction=2"
    --no_use_transposeConv
    --no_use_spatio_att
    --audiovisual True --checkpoint 20 --n_epochs 60
    --root_path "${base_path}"
    --pretrain_path "${pretrain_ckpts[split]}"
    --audio_pretrain_path ./data/pretrained_models/soundnet8.pth
    --annotation_path_coutrot1_train "${fold_lists}/Coutrot_db1_list_train_${split}_fps.txt"
    --annotation_path_coutrot1_test "${fold_lists}/Coutrot_db1_list_test_${split}_fps.txt"
    --annotation_path_coutrot2_train "${fold_lists}/Coutrot_db2_list_train_${split}_fps.txt"
    --annotation_path_coutrot2_test "${fold_lists}/Coutrot_db2_list_test_${split}_fps.txt"
    --annotation_path_summe_train "${fold_lists}/SumMe_list_train_${split}_fps.txt"
    --annotation_path_summe_test "${fold_lists}/SumMe_list_test_${split}_fps.txt"
    --annotation_path_etmd_train "${fold_lists}/ETMD_av_list_train_${split}_fps.txt"
    --annotation_path_etmd_test "${fold_lists}/ETMD_av_list_test_${split}_fps.txt"
    --annotation_path_avad_train "${fold_lists}/AVAD_list_train_${split}_fps.txt"
    --annotation_path_avad_test "${fold_lists}/AVAD_list_test_${split}_fps.txt"
  )

  # Keep going after a failure so the remaining splits still get their run,
  # but remember which ones broke.
  if ! python main.py "${train_args[@]}"; then
    printf 'error: main.py failed for split %s\n' "${split}" >&2
    failed_splits+=("${split}")
  fi
done

# Evaluating a results directory with a missing or stale split would report
# misleading numbers, so stop here instead of scoring partial output.
if (( ${#failed_splits[@]} > 0 )); then
  printf 'error: skipping evaluation; failed split(s): %s\n' "${failed_splits[*]}" >&2
  exit 1
fi

python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
  --eval_path experiments/audiovisual_multi_test3
